from nanovllm import LLM, SamplingParams
# Minimal single-prompt run: build an engine, generate once, print the text.

# NOTE(review): absolute, machine-specific checkpoint location; anyone else
# running this script has to point it at their own copy of the model.
model_dir = "/home/linzhixin/test_field/open_source_model/Qwen/Qwen3-0.6B/"

# Engine options are passed through to LLM unchanged.
# NOTE(review): presumably enforce_eager skips graph capture and
# tensor_parallel_size=1 keeps everything on one device; confirm against
# the nanovllm documentation.
engine_options = {"enforce_eager": True, "tensor_parallel_size": 1}
llm = LLM(model_dir, **engine_options)

# Decoding settings: temperature 0.6, at most 1024 new tokens.
sampling_params = SamplingParams(max_tokens=1024, temperature=0.6)

# One prompt in Chinese ("Hello, who are you"); it is sent as raw text.
prompts = ["你好，你是谁"]

outputs = llm.generate(prompts, sampling_params)

# Only one prompt was submitted, so only the first result is printed.
first_result = outputs[0]
print(first_result["text"])